#!/usr/bin/env bash
#
# Smoke test: POST one non-streaming completion request to the
# /v1/completions endpoint of a locally running inference server and print
# the response body to stdout.
#
# Environment:
#   API_BASE_URL  Scheme, host and port of the server
#                 (default: http://127.0.0.1:9997).
#
# Exit status:
#   0         the server answered with a 2xx HTTP status
#   1         the server answered with any other HTTP status
#   non-zero  curl itself failed (e.g. connection refused); curl's own exit
#             code is propagated by `set -e`
set -euo pipefail

readonly API_BASE_URL="${API_BASE_URL:-http://127.0.0.1:9997}"

# Request body, sent verbatim.
# NOTE(review): "size_in_billions", "model_engine" and "model_format" look
# like model-launch settings rather than per-request completion parameters;
# confirm the server actually reads them here before relying on them.
readonly request_body='{
        "model": "deepseek-r1",
	"size_in_billions": "671",
	"model_engine": "vllm",
	"model_format": "pytorch",
        "prompt": "San Francisco is a",
        "max_tokens": 1024,
        "temperature": 0.6,
	"ignore_eos": false,
	"stream": false
    }'

# curl exits 0 even when the server replies with HTTP 4xx/5xx, so ask it to
# append the status code on a final line of its own and split that line off
# again below. The response is buffered in memory, which is fine because the
# payload requests "stream": false.
response=$(
  curl --silent --show-error \
    --header "Content-Type: application/json" \
    --data "${request_body}" \
    --write-out '\n%{http_code}' \
    "${API_BASE_URL}/v1/completions"
)
http_status=${response##*$'\n'}   # text after the last newline
response_body=${response%$'\n'*}  # everything before that newline

# Emit the body exactly as received (no extra trailing newline).
printf '%s' "${response_body}"

if [[ "${http_status}" != 2* ]]; then
  printf '\nerror: %s/v1/completions returned HTTP %s\n' \
    "${API_BASE_URL}" "${http_status}" >&2
  exit 1
fi
